import openai

# Client pointed at an OpenAI-compatible HTTP endpoint on localhost.
# NOTE(review): "EMPTY" looks like a placeholder key for a local server that
# does not check credentials -- confirm against the server configuration.
client = openai.Client(
    base_url="http://localhost:8000/v1",
    api_key="EMPTY",
)

# Send a single-turn chat request. The model is identified by a filesystem
# path; presumably this matches the name the server registered the model
# under -- verify against the server's launch arguments.
response = client.chat.completions.create(
    model="/root/workspace/llm_models/MiniCPM4-8B",
    messages=[
        {"role": "user", "content": "你好！"},
    ],
    temperature=0.7,
    max_tokens=1024,
    # extra_body fields are merged into the request JSON as-is; they are
    # server-specific extensions rather than standard OpenAI parameters.
    extra_body={
        "add_special_tokens": True,
    },
)

# Each choice carries a single `message` object (singular); the previous
# `.messages` attribute does not exist and raised AttributeError.
print(response.choices[0].message.content)
